All

沿指定轴计算张量的逻辑与 (Logical AND)。如果轴上的所有元素都为真(非零),则输出为1.0,否则为0.0。

\[Y_i = \prod_{x \in S_i} B(x)\]

其中 \(S_i\) 是输入张量中用于计算输出 \(Y_i\) 的切片, \(B(x)\) 是一个辅助函数:

\[\begin{split}B(x)=\begin{cases} 1, & \text{if } x \neq 0 \\ 0, & \text{if } x = 0 \end{cases}\end{split}\]
输入:
  • outer_size - 规约轴之前的所有维度大小的乘积。

  • inner_size - 规约轴之后的所有维度大小的乘积。

  • axis_size - 规约轴本身的大小。

  • src_data - 输入数据地址。

  • core_mask - 核掩码。

输出:
  • dst_data - 输出数据地址。

支持平台:

FT78NE MT7004

备注

  • FT78NE 支持int8, int16, int32, fp32, fp64, cplx64, cplx128

  • MT7004 支持fp16, fp32, int16, int32, cplx64

共享存储版本:

void i8_reduceall_s(int outer_size, int inner_size, int axis_size, int8_t *src_data, int8_t *dst_data, int core_mask)
void i16_reduceall_s(int outer_size, int inner_size, int axis_size, int16_t *src_data, int16_t *dst_data, int core_mask)
void i32_reduceall_s(int outer_size, int inner_size, int axis_size, int *src_data, int *dst_data, int core_mask)
void hp_reduceall_s(int outer_size, int inner_size, int axis_size, half *src_data, half *dst_data, int core_mask)
void fp_reduceall_s(int outer_size, int inner_size, int axis_size, float *src_data, float *dst_data, int core_mask)
void dp_reduceall_s(int outer_size, int inner_size, int axis_size, double *src_data, double *dst_data, int core_mask)
void c64_reduceall_s(int outer_size, int inner_size, int axis_size, float *src_data, float *dst_data, int core_mask)
void c128_reduceall_s(int outer_size, int inner_size, int axis_size, double *src_data, double *dst_data, int core_mask)

C调用示例:

 1//FT78NE示例
 2#include <stdio.h>
 3#include <all.h>
 4int main(int argc, char* argv[]) {
 5    float *src_data = (float *)0xA0000000;   //input在DDR空间
 6    float *dst_data = (float *)0xB0000000;   //output
 7    int outer_size = 2;
 8    int inner_size = 4;
 9    int axis_size = 3;
10    int core_mask = 0xff;
11    fp_reduceall_s(outer_size, inner_size, axis_size, src_data, dst_data, core_mask);
12    return 0;
13}

私有存储版本:

void i8_reduceall_p(int outer_size, int inner_size, int axis_size, int8_t *src_data, int8_t *dst_data)
void i16_reduceall_p(int outer_size, int inner_size, int axis_size, int16_t *src_data, int16_t *dst_data)
void i32_reduceall_p(int outer_size, int inner_size, int axis_size, int *src_data, int *dst_data)
void hp_reduceall_p(int outer_size, int inner_size, int axis_size, half *src_data, half *dst_data)
void fp_reduceall_p(int outer_size, int inner_size, int axis_size, float *src_data, float *dst_data)
void dp_reduceall_p(int outer_size, int inner_size, int axis_size, double *src_data, double *dst_data)
void c64_reduceall_p(int outer_size, int inner_size, int axis_size, float *src_data, float *dst_data)
void c128_reduceall_p(int outer_size, int inner_size, int axis_size, double *src_data, double *dst_data)

C调用示例:

 1//FT78NE示例
 2#include <stdio.h>
 3#include <all.h>
 4int main(int argc, char* argv[]) {
 5    float *src_data = (float *)0x10000000;   //input在DDR空间
 6    float *dst_data = (float *)0x10001000;   //output
 7    int outer_size = 2;
 8    int inner_size = 4;
 9    int axis_size = 3;
10    fp_reduceall_p(outer_size, inner_size, axis_size, src_data, dst_data);
11    return 0;
12}